import json, random
from collections import defaultdict, Counter

def similarity(w1, w2):
	"""Return a similarity score for the word pair (w1, w2).

	The score is a pseudo-random float drawn from [0.0, 1.0); neither
	argument is inspected, so repeated calls with the same pair will
	generally give different results.
	NOTE(review): this looks like a stand-in for a real similarity
	measure -- confirm before relying on the scores.
	"""
	score = random.random()
	return score

# Flat list of every word found in the topics file (duplicates are kept).
vocabulary = []

# Only the first line of the file is read; it must contain a JSON object.
with open("topics_extracted_from_0-65189.txt",'r') as f:
	temp = defaultdict(list,json.loads(f.readline()))

# FIX: the loop below used to iterate over `topics`, a name that was never
# defined, so the script died with a NameError right after loading the file.
# NOTE(review): this assumes the JSON object maps a topic key to a list of
# words, which is why the values (not the keys) are flattened -- confirm
# against the actual file contents.
topics = temp.values()

for t in topics:
	# Equivalent to appending each element of `t` one at a time.
	vocabulary.extend(t)


# NOTE(review): `a` is never read in the visible code; kept in case something
# outside this view still refers to it.
a = []

# Repeatedly remove the last word and score it against every word still in
# the list, so each unordered pair of list positions is scored exactly once.
# The loop stops when a single word is left, since it has no partner.
while len(vocabulary) > 1:
	# Scores for the current word only; rebuilt from scratch each iteration.
	# NOTE(review): `similar` is discarded at the end of every pass -- the
	# scores are computed but never stored or reported anywhere.
	similar = defaultdict(float)
	word = vocabulary.pop()
	for item in vocabulary:
		similar[item] = similarity(word,item)
	# Progress indicator: number of words still to process.
	# FIX: was the Python 2-only statement `print len(vocabulary)`, which is
	# a SyntaxError on Python 3; the call form prints the same text on both.
	print(len(vocabulary))
	
